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Syntax 
<Body> 

rib. oA <Generalized1> 

<Atom1> 
<Atom2> 



USER SELECTED CONTENT 


GENERALIZED CONTENT 


CATEGORIES 172 

ANTIQUES & ART 
BOOKS, MOVIES & MUSIC 
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<Atom2> — 186 

<Grp2> 

<Generalized2> 

<Atom3> — 186 
<Atom4> — 186 



194 



180 



FIG. 9A 



1QR 



10/22 



188 

USER SELECTED CONTENT 



190 

GENERALIZED CONTENT 



Specialty Sites 

AUTOMOTIVE 
BUSINESS EXCHANGE 

Categories 

ANTIQUES & ART 
BOOKS, MOVIES & MUSIC 



Specialty Sites 

AUTOMOTIVE 
BUSINESS EXCHANGE 
GREAT COLLECTIONS 
HALF.COM (AN EBAY COMPANY) 

Categories 

ANTIQUES & ART 
BOOKS, MOVIES & MUSIC 
COINS & STAMPS 
COLLECTIBLES 
COMPUTERS 
DOLLS, FIGURES 
JEWELRY, GEMSTONES 
PHOTO & ELECTRONICS 
POTTERY & GLASS 
REAL ESTATE new 1 . 
SPORTS 

TOYS, BEAN BAG PLUSH 
EVERYTHING ELSE 
ALL CATEGORIES... 



FIG. 9C 



11/22 



<generalized displayname="Generalized 1"> 

<include> 

<atomic xhtmlsourceid="131" displayname="Automotive "> 
<content> 

<contentitem id="1" sourceid="131" displayname="Content Item"> 

<pathelement type="html" order="1"/> 
<pathelement type="body" order="1"/> 
<pathelement type="table" order="2"/> 
<pathelement type="tr" order="1"/> 
<pathelement type="td" order="1"/> 
<pathelement type="table" order="1"/> 
<pathelement type="tr" order="2"/> 
<pathelement type="td" order="2"/> 
<pathelement type="font" order="1"/> 
<pathelement type="b" order="1"/> 
<pathelement type="a" order="1"/> 
</contentitem> 

</content> 

<attributes> 

<class value="10,20,30"/> 

<align value="left"/> 

<name value="Automotive"/> 
</attributes> 
</atomic> 



A 2 



FIG. 10A 1 



A 2 
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J 



£ b\ 

<atomic xhtmlsourceid="133" displayname="Business Exchange "> 
<content> 

<contentitem id="1" sourceid="133" displayname="Content Item"> 

<pathelement type="html" order="1"/> 

<pathelement type="body" order="1"/> 

<pathelement type="table" order="2"/> 

<pathelement type="tr" order="1"/> 

<pathelement type="td" order="1"/> 

<pathelement type="table" order="1"/> 

<pathelement type="tr" order="2"/> 

<pathelement type="td" order="2"/> 
<pathelement type="font" order="1"/> 

<pathelement type="b" order="1"/> 

<pathelement type="a" order="2"/> 

</contentitem> 
</content> 
<attributes> 

<class value="10,20,30"/> 

<align value="left"/> 

<name value="Business Exchange "/> 

</attributes> 

</atomic> 

</include> 
</generalized> 

FIG. 10A2 
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202 

B. INTERMEDIATE FILE (AFTER GENERALIZATION) 

<group displayname="Specialty"> 
<attributes> 

<class value="10,20,30"/> 
<sequential value="sequential"/> 
<align value="left"/> 
<name value="Specialty"/> 
</attributes> 

<atomic displayname="Automotive " xhtmlsourceid="131"> 
<content> 

<contentitem displayname="Content Item" id="1" sourceid="131"/> 
</content> 
<attributes> 

<class value="10,20,30"/> 
<align value="left"/> 

<name enumerate="enumerate" value="Automotive "/> 
</attributes> 

<xhtmlpath generalized="true"> 
<pathelement order="-1" type="a"/> 

</xhtmlpath> 
</atomic> 
<xhtmlpath> 

<pathelement axis="descendant::" order="-1" predicate="child::a and child::font" type="b"/> 
</xhtmlpath> 

</group> 

FIG. 10B1 2 
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<group displayname="Categories"> 
<attributes> 

<class value="10,20,30"/> 
<sequential value="sequential"/> 
<align value="left"/> 
<name value="Categories"/> 
</attributes> 

<atomic displayname="Antiques and Art " xhtmlsourceid="158"> 
<content> 

<contentitem displayname="Content Item" id="1" sourceid="158"/> 
</content> 
<attributes> 

<class value="10,20,30"/> 
<align value="left"/> 

<name enumerate="enumerate" value="Antiques and Art "/> 
</attributes> 

<xhtmlpath generalized="true"> 
<pathelement order="-1" type="a"/> 

</xhtmlpath> 
</atomic> 
<xhtmlpath> 

<pathelement axis="descendant::" order="-1" predicate="child::a and child::img" type="b"/> 
</xhtmlpath> 

</group> 
<xhtmlpath> 

<pathelement order="1" type="body"/> 

</xhtmlpath> 
</group> 
<xhtmlpath> 

<pathelement order="-1 "predicate=" ancestor: :document[@page=Tl 



</xhtmlpath> 
</arm!> 
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c) Final Stylesheet 



15/22 

The relevant portion of the final XSL Stylesheet generated as a 
result of the generalization as depicted in the example of 
Case-2 is given below: 

<xsl:template match="body" mode="Body"> 



<group class="10,20,30" name="Body" sequential="sequential"> 
<xsl:apply-templates select="descendant::b[child::a and child::font]" mode="Specialty"/> 
<xsl:apply-templates select="descendant::b[child::a and child::img]" mode="Categories"/> 
</group> 
</xsl:template> 

<xsl:template match="b" mode="Specialty"> 

<group class="10,20,30" sequential="sequential" align="left" name="Specialty"> 
<xsl:apply-templates select="a" mode="Automotive~"/> 

</group> 
</xsl:template> 

<xsl:template match="b" mode="Categories"> 

<group class="10,20,30" sequential="sequential" align="left" name="Categories"> 
<xsl:apply-templates select="a" mode="Antiques~and~Art~"/> 

</group> 
</xsl:template> 

<xsl:template match="a" mode="Automotive~"> 
<atomic class="10,20,30" align="left" name="Automotive"> 
<a href="{./@href}"> 

<xsl:value-of select="normalize-space(.)"/> 
</a> 

</atomic> 
</xsl:template> 

<xsl:template match="a" mode="Antiques~and~Art~"> 
<atomic class="10,20,30" align="left" name="Antiques and Art "> 
<a href="{./@href}"> 

<xsl:value-of select="normalize-space(.)"/> 
</a> 

</atomic> 

</xsl:template> 

FIG. 10C 
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Syntax 
<Body> 

<Generalized1> 

f <Grp1> //R1.C1 

212 <Atom1> \ 01C 

I <Atom2> -^ >21B 

r <Grp2> //R1.C2 

?14 <Atom3> \n 1c 

] <Atom4> - >21B 
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Syntax 
<Body> 

<Generalized1> 
f<Grp1> 



232 



234 



<Atom1> 
<Atom2> 
<Grp2> 

<Atom3>^. OQC 
<f\tomA>- :>eiSb 



//R1.C1 
236 
//R2.C1 
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<Body> 

<Generalized1> 
'<Grp1> 
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Syntax 
<Body> 

<Generalized1> 
f<Grp1> 



272 



274 



270 



276 
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<generalized> *~ 
<group> 
<group> 

<atomic> 
<atomic> 
<atomic> 
<group> 

<group> 

<generalized> 
<atomic> 
<atomic> 

<atomic> 
<generalized> 
<group> 

<generalized> 
<group> 
<atomic> 
<atomic> 
<group> 
<atomic> 
<atomic> 

<group> 

<generalized> 
<group> 
<atomic> 
<atomic> 
<group> 
<atomic> 
<atomic> 

<group> 

<group> 

<atomic> 
<atomic> 
<atomic> 
<group> 

<group> 

<generalized> 
<atomic> 
<atomic> 

<atomic> 



